% Xu, Xiong, Chen, Corso -- AAAI 2015 conference paper (pp. 2346--2352).
% Field values are kept ASCII-only so the entry works with classic BibTeX
% as well as Biber: the page range uses "--" and the series uses a plain
% apostrophe. The acronym in booktitle is braced to survive style recasing.
@inproceedings{10.5555/2886521.2886647,
	author = {Xu, Ran and Xiong, Caiming and Chen, Wei and Corso, Jason J.},
	title = {Jointly Modeling Deep Video and Compositional Text to Bridge Vision and Language in a Unified Framework},
	year = {2015},
	isbn = {0262511290},
	publisher = {AAAI Press},
	booktitle = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence},
	pages = {2346--2352},
	numpages = {7},
	location = {Austin, Texas},
	series = {AAAI'15}
}